%% This BibTeX bibliography file was created using BibDesk.
%% http://bibdesk.sourceforge.net/


%% Created for Brian Tanner at 2009-02-17 11:53:22 -0700 


%% Saved with string encoding Unicode (UTF-8) 
%% Conference paper (ISER 2004) on autonomous inverted helicopter flight; record sourced from DBLP.
%% The ee and bibsource fields are DBLP bookkeeping carried over unchanged.
@inproceedings{ng:iser04,
  author    = {Ng, Andrew Y. and
               Coates, Adam and
               Diel, Mark and
               Ganapathi, Varun and
               Schulte, Jamie and
               Tse, Ben and
               Berger, Eric and
               Liang, Eric},
  title     = {Autonomous Inverted Helicopter Flight via Reinforcement Learning},
  booktitle = {Proceedings of the International Symposium on Experimental Robotics},
  pages     = {363--372},
  year      = {2004},
  ee        = {http://dx.doi.org/10.1007/11552246_35},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}
%% Journal article: elevator group control with multiple reinforcement learning agents.
%% Issue and page ranges use the double hyphen so styles typeset an en dash.
@article{crites:mlj98,
  author  = {Crites, Robert H. and Barto, Andrew G.},
  title   = {Elevator Group Control Using Multiple Reinforcement Learning Agents},
  journal = {Machine Learning},
  volume  = {33},
  number  = {2--3},
  pages   = {235--262},
  year    = {1998},
}
%% Journal article on the TD-Gammon backgammon program.
%% The program name is braced as a whole word so sentence-casing styles keep its capitals.
@article{tesauro:nc94,
  author  = {Tesauro, Gerald},
  title   = {{TD-Gammon}, A Self-Teaching Backgammon Program Achieves Master-Level Play},
  journal = {Neural Computation},
  volume  = {6},
  pages   = {215--219},
  year    = {1994},
}


%% Web resource: the Reinforcement Learning Library site.
%% Uses the standard misc entry type; the date-* and lastchecked fields are bookkeeping metadata.
@misc{rllibrary,
  author        = {Tanner, Brian and White, Adam},
  title         = {The Reinforcement Learning Library},
  url           = {http://library.rl-community.org},
  month         = feb,
  year          = {2009},
  lastchecked   = {Feb 2009},
  date-added    = {2009-02-17 11:48:50 -0700},
  date-modified = {2009-02-17 11:53:18 -0700},
}

%% Journal article on approximating discrete probability distributions with dependence trees.
@article{chow:68,
  author  = {Chow, C. K. and Liu, C. N.},
  title   = {Approximating discrete probability distributions with dependence trees},
  journal = {IEEE Transactions on Information Theory},
  volume  = {IT-14},
  number  = {3},
  pages   = {462--467},
  year    = {1968},
}

%% Journal survey article on reinforcement learning.
%% Title is stored in Title Case like the other entries; sentence-casing styles can still downcase it.
@article{rlsurvey,
  author  = {Kaelbling, Leslie Pack and Littman, Michael L. and Moore, Andrew W.},
  title   = {Reinforcement Learning: A Survey},
  journal = {Journal of Artificial Intelligence Research},
  volume  = {4},
  pages   = {237--285},
  year    = {1996},
}

%% Book: Neuro-Dynamic Programming.
%% Series name and number live in the series/volume fields rather than inside the title.
%% The citeulike-article-id, posted-at, priority, keywords and howpublished fields are import metadata.
@book{ndp,
  author               = {Bertsekas, Dimitri P. and Tsitsiklis, John N.},
  title                = {Neuro-Dynamic Programming},
  series               = {Optimization and Neural Computation Series},
  volume               = {3},
  publisher            = {Athena Scientific},
  month                = may,
  year                 = {1996},
  isbn                 = {1886529108},
  howpublished         = {Hardcover},
  keywords             = {optimization, programming, reinforcement},
  citeulike-article-id = {206209},
  posted-at            = {2007-07-27 20:43:16},
  priority             = {3},
}

%% Book: Reinforcement Learning, An Introduction.
%% Case protection is kept on the same words as before, but applied to whole words.
@book{rlbook,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  title     = {Reinforcement {Learning}: {An} {Introduction}},
  publisher = {The MIT Press},
  address   = {Cambridge, Massachusetts},
  year      = {1998},
}

%% Book: Machine Learning.
%% The protected word is braced as a whole rather than by its first letter only.
@book{mitchell:97,
  author    = {Mitchell, Tom M.},
  title     = {Machine {Learning}},
  publisher = {McGraw Hill},
  address   = {New York, New York},
  year      = {1997},
}

%% Conference paper (17th ICML) on reinforcement learning in continuous spaces.
%% Publisher name and publisher city are stored in separate fields.
@inproceedings{smart:00,
  author    = {Smart, William D. and Kaelbling, Leslie Pack},
  title     = {Practical Reinforcement Learning in Continuous Spaces},
  booktitle = {Proceedings of the 17th International Conference on Machine Learning},
  pages     = {903--910},
  publisher = {Morgan Kaufmann},
  address   = {San Francisco, CA},
  year      = {2000},
}

%% Conference paper (NIPS volume 7) on safe value-function approximation.
%% The volume number is kept in its own field instead of inside the booktitle.
@inproceedings{boyan:95,
  author    = {Boyan, Justin A. and Moore, Andrew W.},
  editor    = {Tesauro, G. and Touretzky, D. S. and Leen, T. K.},
  title     = {Generalization in Reinforcement Learning: {Safely} Approximating the Value Function},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {7},
  pages     = {369--376},
  publisher = {The MIT Press},
  address   = {Cambridge, MA},
  year      = {1995},
}

%% Conference paper (ICML 2003) on advising reinforcement learning agents.
%% The title carries no trailing period; the bibliography style supplies punctuation.
@inproceedings{wiewiora:03,
  author    = {Wiewiora, Eric and Cottrell, Garrison W. and Elkan, Charles},
  title     = {Principled Methods for Advising Reinforcement Learning Agents},
  booktitle = {International Conference on Machine Learning},
  pages     = {792--799},
  year      = {2003},
}

%% PhD thesis on memory-based learning for robot control.
%% NOTE(review): the given name is spelled out to match the Andrew W. Moore entries elsewhere in this file;
%% confirm it is the same author.
@phdthesis{moore:90,
  author  = {Moore, Andrew W.},
  title   = {Efficient Memory-based Learning for Robot Control},
  school  = {University of Cambridge},
  address = {Cambridge, UK},
  year    = {1990},
}

%% Master's thesis on a standard benchmarking system for reinforcement learning.
%% Case protection covers the same words as before, braced as whole words.
@mastersthesis{whitethesis,
  author  = {White, Adam},
  title   = {A {Standard System} for {Benchmarking} in {Reinforcement Learning}},
  school  = {University of Alberta},
  address = {Alberta, Canada},
  year    = {2006},
}

%% Journal article on reinforcement learning with replacing eligibility traces.
@article{singh:96,
  author  = {Singh, Satinder P. and Sutton, Richard S.},
  title   = {Reinforcement Learning with Replacing Eligibility Traces},
  journal = {Machine Learning},
  volume  = {22},
  number  = {1--3},
  pages   = {123--158},
  year    = {1996},
}

%% Journal article describing the RL-Glue protocol.
%% NOTE(review): volume, number and pages still hold the placeholder "??" and will print verbatim;
%% replace them once the real values are known.
@article{whitesutton,
  author  = {White, Adam and Sutton, Richard S.},
  title   = {The {RL-Glue Protocol}: a {Communication Standard} for {Reinforcement Learning Experiments}},
  journal = {Journal of Machine Learning Research},
  volume  = {??},
  number  = {??},
  pages   = {??},
  year    = {2009},
}

%% Conference paper (ECML 2005) introducing Neural Fitted Q Iteration.
%% The letter Q is braced so sentence-casing styles do not lowercase it; the style supplies the final period.
@inproceedings{riedmiller:05,
  author    = {Riedmiller, Martin},
  title     = {Neural Fitted {Q} Iteration -- First Experiences with a Data Efficient Neural Reinforcement Learning Method},
  booktitle = {European Conference on Machine Learning},
  pages     = {317--328},
  year      = {2005},
}

%% PhD thesis on robustness, uncertainty and approximation in learned decision making.
%% The month uses the predefined three-letter macro so each style can format it.
@phdthesis{bagnell:04,
  author  = {Bagnell, James},
  title   = {Learning Decisions: Robustness, Uncertainty, and Approximation},
  school  = {Robotics Institute, Carnegie Mellon University},
  address = {Pittsburgh, PA},
  month   = aug,
  year    = {2004},
}

%% Conference paper (NIPS volume 8) on generalization with sparse coarse coding.
@inproceedings{sutton:96,
  author    = {Sutton, Richard S.},
  editor    = {Touretzky, David S. and Mozer, Michael C. and Hasselmo, Michael E.},
  title     = {Generalization in Reinforcement Learning: Successful Examples Using Sparse Coarse Coding},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {8},
  pages     = {1038--1044},
  publisher = {The {MIT} Press},
  year      = {1996},
}

%% Dataset collection: the UCI machine learning repository.
%% Authors are separated with the keyword and, as BibTeX requires; commas only split a surname from given names.
%% NOTE(review): the url field writes the tilde as math-mode \sim; if the bibliography style typesets URLs
%% verbatim this prints literally, so a plain tilde may be preferable. Confirm against the style in use.
@misc{uci:98,
  author      = {Newman, D. J. and Hettich, S. and Blake, C. L. and Merz, C. J.},
  title       = {{UCI} Repository of machine learning databases},
  institution = {University of California, Irvine, Dept. of Information and Computer Sciences},
  url         = {http://www.ics.uci.edu/$\sim$mlearn/MLRepository.html},
  year        = {1998},
  bdsk-url-1  = {http://www.ics.uci.edu/$%5Csim$mlearn/MLRepository.html},
}

%% Web resource: the Standard Performance Evaluation Corporation site.
@misc{spec:95,
  author     = {Powers, Kathy and Sandifer, Cathy and Rice, Dianne and Glick, Jason and Cramblitt, Bob},
  title      = {Standard Performance Evaluation Corporation},
  url        = {http://www.spec.org/},
  year       = {1995},
  bdsk-url-1 = {http://www.spec.org/},
}

%% Paper in an edited volume describing the Matrix Market test-matrix collection.
@inproceedings{matrix:97,
  author    = {Boisvert, Ronald F. and Pozo, Roldan and Remington, Karin and Barrett, Richard and Dongarra, Jack J.},
  editor    = {Boisvert, Ronald F.},
  title     = {The {Matrix Market}: {A} Web Resource for Test Matrix Collections},
  booktitle = {Quality of Numerical Software, Assessment and Enhancement},
  pages     = {125--137},
  publisher = {Chapman \& Hall},
  address   = {London},
  year      = {1997},
}

%% PhD thesis on algorithms for multi-player games.
@phdthesis{sturtevant:03,
  author = {Sturtevant, Nathan R.},
  title  = {Multi-Player Games: Algorithms and Approaches},
  school = {Computer Science Department, UCLA},
  year   = {2003},
}
